from numba import cuda
import multiprocessing
import numpy as np

@cuda.jit
def test(arr):
    """Read the element at row 1, column 1 of ``arr`` and discard it.

    Every launched thread performs the same single read; nothing is
    written back to ``arr``.

    Args:
        arr: A two-dimensional array indexable at ``[1, 1]``, i.e. with
            at least two rows and two columns.
    """
    # Index with a tuple rather than chaining ``arr[1][1]``: the chained
    # form first builds an intermediate 1-D row view and then indexes it.
    temp = arr[1, 1]

# Host-side input: the six consecutive integers 0..5 as a flat array.
arr_h = np.arange(6)

# Copy the flat host array to the GPU.
arr_d = cuda.to_device(arr_h)

# Reshape the device array to 2 rows by 3 columns so the kernel can read
# the element at row 1, column 1.
arr_temp_d = arr_d.reshape(2, 3)

# Launch configuration: a 2x3 grid of blocks, each with 3x4 threads.
test[(2, 3), (3, 4)](arr_temp_d)